# -*- coding: utf-8 -*-
# html parser来解析html

from html.parser import HTMLParser
from html.entities import name2codepoint

class MyHtmlParser(HTMLParser):

	def handle_starttag(self,tag,attrs):
		print('<%s>' % tag)

	def hanle_endtag(self,tag,attrs):
		print('</%s>' % tag)

	def handle_startendtag(self,tag,attrs):
		print('<%s/>' % tag)

	def handle_data(self,data):
		print(data)

	def handle_comment(self,data):
		print('<!--', data, '-->')

	def handle_entityref(self,name):
		print('&%s,' % name)

	def handle_charref(self,name):
		print('&#%s:' % name)

parser = MyHtmlParser()
parser.feed('''<html>
<head></head>
<body>
<!-- test html parser -->
    <p>Some <a href=\"#\">html</a> HTML&nbsp;tutorial...<br>END</p>
</body></html>''')

# feed()